Installing the packages

install.packages("outliers")
WARNING: Rtools is required to build R packages but is not currently installed. Please download and install the appropriate version of Rtools before proceeding:

https://cran.rstudio.com/bin/windows/Rtools/
Installing package into ‘C:/Users/Alanoud/AppData/Local/R/win-library/4.3’
(as ‘lib’ is unspecified)
trying URL 'https://cran.rstudio.com/bin/windows/contrib/4.3/outliers_0.15.zip'
Content type 'application/zip' length 84415 bytes (82 KB)
downloaded 82 KB
package ‘outliers’ successfully unpacked and MD5 sums checked

The downloaded binary packages are in
    C:\Users\Alanoud\AppData\Local\Temp\RtmpOGXNH2\downloaded_packages
install.packages("scatterplot3d") 
WARNING: Rtools is required to build R packages but is not currently installed. Please download and install the appropriate version of Rtools before proceeding:

https://cran.rstudio.com/bin/windows/Rtools/
Installing package into ‘C:/Users/Alanoud/AppData/Local/R/win-library/4.3’
(as ‘lib’ is unspecified)
trying URL 'https://cran.rstudio.com/bin/windows/contrib/4.3/scatterplot3d_0.3-44.zip'
Content type 'application/zip' length 352418 bytes (344 KB)
downloaded 344 KB
package ‘scatterplot3d’ successfully unpacked and MD5 sums checked

The downloaded binary packages are in
    C:\Users\Alanoud\AppData\Local\Temp\RtmpOGXNH2\downloaded_packages
install.packages("dplyr")
WARNING: Rtools is required to build R packages but is not currently installed. Please download and install the appropriate version of Rtools before proceeding:

https://cran.rstudio.com/bin/windows/Rtools/
Installing package into ‘C:/Users/Alanoud/AppData/Local/R/win-library/4.3’
(as ‘lib’ is unspecified)
trying URL 'https://cran.rstudio.com/bin/windows/contrib/4.3/dplyr_1.1.3.zip'
Content type 'application/zip' length 1553271 bytes (1.5 MB)
downloaded 1.5 MB
package ‘dplyr’ successfully unpacked and MD5 sums checked

The downloaded binary packages are in
    C:\Users\Alanoud\AppData\Local\Temp\RtmpOGXNH2\downloaded_packages

Loading the libraries and reading the dataset

library(outliers)
library(scatterplot3d)
library(dplyr)

library(readr)
# Read the salary CSV into `dataset`; the path is relative, so it is resolved
# against the current working directory.
dataset <- read_csv(file = "GitHub/SalaryPrediction/Dataset/salary.csv")
Rows: 32561 Columns: 15── Column specification ──────────────────────────────────────────────────────────────────────
Delimiter: ","
chr (9): workclass, education, marital-status, occupation, relationship, race, sex, native...
dbl (6): age, fnlwgt, education-num, capital-gain, capital-loss, hours-per-week
ℹ Use `spec()` to retrieve the full column specification for this data.
ℹ Specify the column types or set `show_col_types = FALSE` to quiet this message.

Sample of raw dataset and summary

# Open the raw data in the interactive data viewer.
View(dataset)
# Print per-column summary statistics (quantiles for numeric columns,
# length/class/mode for character columns).
summary(dataset)
      age         workclass             fnlwgt         education         education-num  
 Min.   :17.00   Length:32561       Min.   :  12285   Length:32561       Min.   : 1.00  
 1st Qu.:28.00   Class :character   1st Qu.: 117827   Class :character   1st Qu.: 9.00  
 Median :37.00   Mode  :character   Median : 178356   Mode  :character   Median :10.00  
 Mean   :38.58                      Mean   : 189778                      Mean   :10.08  
 3rd Qu.:48.00                      3rd Qu.: 237051                      3rd Qu.:12.00  
 Max.   :90.00                      Max.   :1484705                      Max.   :16.00  
 marital-status      occupation        relationship           race          
 Length:32561       Length:32561       Length:32561       Length:32561      
 Class :character   Class :character   Class :character   Class :character  
 Mode  :character   Mode  :character   Mode  :character   Mode  :character  
                                                                            
                                                                            
                                                                            
     sex             capital-gain    capital-loss    hours-per-week  native-country    
 Length:32561       Min.   :    0   Min.   :   0.0   Min.   : 1.00   Length:32561      
 Class :character   1st Qu.:    0   1st Qu.:   0.0   1st Qu.:40.00   Class :character  
 Mode  :character   Median :    0   Median :   0.0   Median :40.00   Mode  :character  
                    Mean   : 1078   Mean   :  87.3   Mean   :40.44                     
                    3rd Qu.:    0   3rd Qu.:   0.0   3rd Qu.:45.00                     
                    Max.   :99999   Max.   :4356.0   Max.   :99.00                     
    salary         
 Length:32561      
 Class :character  
 Mode  :character  
                   
                   
                   

Missing values

# Total number of NA cells across the whole data frame.
sum(is.na(dataset))
[1] 0

We noticed that some values contain a question mark ("?") even though the missing-value check in the previous step returned 0. These "?" entries are placeholders for missing data, so we clean the dataset by deleting every row that contains one.

# Drop every row in which at least one column holds the "?" placeholder.
# rowSums(..., na.rm = TRUE) counts the "?" cells per row while ignoring NA
# comparisons, so a genuine NA elsewhere in a row can never turn the row mask
# into NA (an NA in a logical row subscript would corrupt the subset).
dataset <- dataset[rowSums(dataset == "?", na.rm = TRUE) == 0, ]
print(dataset)

Removing outliers

# Logical mask over dataset$age produced by outlier(logical = TRUE), followed
# by the number of flagged entries.
# NOTE(review): outlier() appears to flag only the single most extreme value
# (and its duplicates) - confirm this is the intended outlier definition.
OutAge <- outlier(dataset$age, logical = TRUE)
sum(OutAge)
[1] 35
# Positions of the flagged age entries. OutAge is already a logical vector, so
# it is passed to which() directly.
Find_outlier <- which(OutAge)
# Echo the full mask (the console truncates it at getOption("max.print")).
OutAge
   [1] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [15] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [29] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [43] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [57] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [71] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [85] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [99] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [113] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [127] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [141] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [155] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [169] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [183] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [197] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE  TRUE FALSE FALSE FALSE
 [211] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [225] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [239] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [253] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [267] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [281] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [295] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [309] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [323] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [337] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [351] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [365] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [379] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [393] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [407] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [421] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [435] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [449] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [463] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [477] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [491] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [505] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [519] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [533] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [547] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [561] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [575] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [589] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [603] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [617] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [631] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [645] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [659] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [673] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [687] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [701] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [715] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [729] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [743] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [757] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [771] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [785] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [799] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [813] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [827] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [841] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [855] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [869] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [883] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [897] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [911] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [925] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [939] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [953] FALSE FALSE FALSE FALSE  TRUE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [967] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [981] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [995] FALSE FALSE FALSE FALSE FALSE FALSE
 [ reached getOption("max.print") -- omitted 29161 entries ]
# Print the positions stored in Find_outlier (at this point: the flagged age
# entries).
Find_outlier
 [1]   207   957  1781  2122  2655  3735  4682  4836  4922  4954  5731  6100  8133  8288  9436
[16]  9750 10640 11094 12007 13114 14226 14721 17064 17355 17457 17810 18063 18304 19099 20589
[31] 22283 26381 28757 29901 29983
####
# Logical mask over dataset$fnlwgt produced by outlier(logical = TRUE),
# followed by the number of flagged entries.
Outfnlwgt <- outlier(dataset$fnlwgt, logical = TRUE)
sum(Outfnlwgt)
[1] 1
# Positions of the flagged fnlwgt entries (overwrites the previous
# Find_outlier value).
Find_outlier <- which(Outfnlwgt)
# Echo the full mask (the console truncates it at getOption("max.print")).
Outfnlwgt
   [1] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [15] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [29] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [43] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [57] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [71] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [85] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [99] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [113] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [127] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [141] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [155] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [169] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [183] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [197] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [211] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [225] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [239] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [253] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [267] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [281] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [295] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [309] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [323] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [337] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [351] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [365] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [379] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [393] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [407] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [421] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [435] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [449] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [463] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [477] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [491] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [505] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [519] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [533] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [547] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [561] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [575] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [589] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [603] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [617] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [631] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [645] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [659] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [673] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [687] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [701] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [715] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [729] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [743] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [757] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [771] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [785] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [799] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [813] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [827] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [841] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [855] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [869] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [883] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [897] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [911] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [925] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [939] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [953] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [967] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [981] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [995] FALSE FALSE FALSE FALSE FALSE FALSE
 [ reached getOption("max.print") -- omitted 29161 entries ]
###
# Logical mask over dataset$`education-num` produced by
# outlier(logical = TRUE), followed by the number of flagged entries.
Outeducation <- outlier(dataset$`education-num`, logical = TRUE)
sum(Outeducation)
[1] 45
# Positions of the flagged education-num entries (overwrites the previous
# Find_outlier value).
Find_outlier <- which(Outeducation)
# Echo the full mask (the console truncates it at getOption("max.print")).
Outeducation
   [1] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [15] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [29] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [43] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [57] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [71] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [85] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [99] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [113] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [127] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [141] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [155] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [169] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [183] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [197] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE  TRUE FALSE
 [211] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [225] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [239] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [253] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [267] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [281] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [295] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [309] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [323] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [337] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [351] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [365] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [379] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [393] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [407] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [421] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [435] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [449] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [463] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [477] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [491] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [505] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [519] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [533] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [547] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [561] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [575] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [589] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [603] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [617] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [631] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [645] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [659] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [673] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [687] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [701] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [715] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [729] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [743] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [757] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [771] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [785] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [799] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [813] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [827] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [841] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [855] FALSE FALSE FALSE  TRUE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [869] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [883] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [897] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [911] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [925] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [939] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [953] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [967] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [981] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [995] FALSE FALSE FALSE FALSE FALSE FALSE
 [ reached getOption("max.print") -- omitted 29161 entries ]
##

# Logical mask over dataset$`hours-per-week` produced by
# outlier(logical = TRUE), followed by the number of flagged entries.
Outhours <- outlier(dataset$`hours-per-week`, logical = TRUE)
sum(Outhours)
[1] 78
# Positions of the flagged hours-per-week entries (overwrites the previous
# Find_outlier value).
Find_outlier <- which(Outhours)
# Echo the full mask (the console truncates it at getOption("max.print")).
Outhours
   [1] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [15] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [29] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [43] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [57] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [71] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [85] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [99] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [113] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [127] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [141] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [155] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [169] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [183] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [197] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [211] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [225] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [239] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [253] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [267] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [281] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [295] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [309] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [323] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [337] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [351] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [365] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [379] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [393] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [407] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [421] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [435] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [449] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [463] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [477] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [491] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [505] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [519] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [533] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [547] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [561] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [575] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [589] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [603] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [617] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [631] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [645] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [659] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [673] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [687] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [701] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [715] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [729] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [743] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [757] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [771] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [785] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [799] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [813] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [827] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [841] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [855] FALSE FALSE FALSE FALSE FALSE FALSE  TRUE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [869] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [883] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [897] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [911] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [925] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [939] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [953] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [967] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [981] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [995] FALSE FALSE FALSE FALSE FALSE FALSE
 [ reached getOption("max.print") -- omitted 29161 entries ]
###
# Flag capital-gain outliers as a logical vector (one entry per row), then
# count how many rows were flagged.
# NOTE(review): per the outliers package docs, outlier() marks the value(s)
# farthest from the sample mean - confirm this is the intended criterion.
OutcapitalG <- outlier(dataset[["capital-gain"]], logical = TRUE)
sum(OutcapitalG)
[1] 148
# Row positions of the flagged capital-gain values, followed by a dump of the
# logical flag vector itself.
Find_outlier <- which(OutcapitalG)
OutcapitalG
   [1] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [15] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [29] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [43] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [57] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [71] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [85] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [99] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [113] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [127] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [141] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [155] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [169] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [183] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [197] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [211] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [225] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [239] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [253] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [267] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [281] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [295] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [309] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [323] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [337] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [351] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [365] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [379] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [393] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [407] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [421] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [435] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [449] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [463] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [477] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [491] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [505] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [519] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [533] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [547] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [561] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [575] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [589] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [603] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [617] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [631] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [645] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [659] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [673] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [687] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [701] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [715] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [729] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [743] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [757] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [771] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [785] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [799] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [813] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [827] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [841] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [855] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [869] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [883] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [897] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [911] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [925] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [939] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [953] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [967] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [981] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [995] FALSE FALSE FALSE FALSE FALSE FALSE
 [ reached getOption("max.print") -- omitted 29161 entries ]
###
# Flag capital-loss outliers as a logical vector (one entry per row), then
# count how many rows were flagged.
OutcapitalL <- outlier(dataset[["capital-loss"]], logical = TRUE)
sum(OutcapitalL)
[1] 2
# Row positions of the flagged capital-loss values (this replaces the indices
# stored for the previous column), followed by a dump of the flag vector.
Find_outlier <- which(OutcapitalL)
OutcapitalL
   [1] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [15] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [29] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [43] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [57] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [71] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [85] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [99] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [113] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [127] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [141] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [155] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [169] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [183] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [197] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [211] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [225] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [239] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [253] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [267] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [281] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [295] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [309] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [323] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [337] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [351] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [365] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [379] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [393] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [407] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [421] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [435] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [449] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [463] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [477] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [491] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [505] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [519] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [533] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [547] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [561] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [575] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [589] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [603] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [617] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [631] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [645] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [659] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [673] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [687] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [701] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [715] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [729] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [743] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [757] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [771] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [785] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [799] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [813] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [827] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [841] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [855] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [869] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [883] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [897] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [911] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [925] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [939] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [953] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [967] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [981] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [995] FALSE FALSE FALSE FALSE FALSE FALSE
 [ reached getOption("max.print") -- omitted 29161 entries ]
# Remove outlier rows.
# NOTE(review): Find_outlier is reassigned for every column above, so at this
# point it only holds the capital-loss indices; rows flagged for the other
# columns (e.g. the 148 capital-gain rows) are NOT removed here.
# Rows are kept by positive index rather than dataset[-Find_outlier, ]: with an
# empty Find_outlier, negative indexing selects zero rows and would silently
# wipe the whole dataset.
dataset <- dataset[setdiff(seq_len(nrow(dataset)), Find_outlier), ]

printing the dataset after cleaning the data

# Show the dataset as it stands after the cleaning steps above.
print(dataset)

Create a new column called num_salary that transforms the binary salary attribute into a numerical one (1 for ">50K", 0 otherwise), so it is easier to use as the class label

# Encode the class label numerically: 1 when salary is ">50K", 0 otherwise.
dataset[["num_salary"]] <- as.numeric(dataset[["salary"]] == ">50K")

Data summary

# Five-number summary plus mean for age.
summary(dataset[["age"]])
   Min. 1st Qu.  Median    Mean 3rd Qu.    Max. 
  17.00   28.00   37.00   38.44   47.00   90.00 
# Five-number summary plus mean for hours-per-week.
summary(dataset[["hours-per-week"]])
   Min. 1st Qu.  Median    Mean 3rd Qu.    Max. 
   1.00   40.00   40.00   40.93   45.00   99.00 
# education is a character column, so summary() only reports length/class/mode.
summary(dataset[["education"]])
   Length     Class      Mode 
    30159 character character 
# occupation is a character column, so summary() only reports length/class/mode.
summary(dataset[["occupation"]])
   Length     Class      Mode 
    30159 character character 
# sex is a character column, so summary() only reports length/class/mode.
summary(dataset[["sex"]])
   Length     Class      Mode 
    30159 character character 
# salary is a character column, so summary() only reports length/class/mode.
summary(dataset[["salary"]])
   Length     Class      Mode 
    30159 character character 

variance

# Sample variance of age.
var(dataset[["age"]])
[1] 172.4654
# Sample variance of hours-per-week.
var(dataset[["hours-per-week"]])
[1] 143.5168

Discretize the hours-per-week into three bins

# Bin weekly hours into three labelled ranges using the break points
# 0, 30, 40 and Inf (cut() closes intervals on the right by default):
# (0, 30] -> Low, (30, 40] -> Medium, (40, Inf] -> High.
dataset[["hours_per_week_binned"]] <- cut(
  dataset[["hours-per-week"]],
  breaks = c(0, 30, 40, Inf),
  labels = c("Low", "Medium", "High")
)
print(dataset[["hours_per_week_binned"]])
   [1] Medium Low    Medium Medium Medium Medium Low    High   High   Medium High   Medium
  [13] Low    High   High   Medium Medium High   High   High   Low    Medium Medium Medium
  [25] Medium Medium High   Medium High   High   Medium Medium Low    Medium Medium Low   
  [37] Medium High   Medium High   Medium Medium Medium Medium Medium Medium High   Medium
  [49] High   High   High   Medium Medium Medium High   Medium Medium Medium High   High  
  [61] Medium Medium Medium High   Medium Medium High   Medium Low    Medium Medium Low   
  [73] Medium Low    Medium Medium High   Medium Medium Medium High   Medium High   Medium
  [85] Medium Low    Medium High   High   High   Medium Medium Medium High   High   Medium
  [97] Medium Medium Medium Medium Medium Medium Medium High   Low    Medium High   High  
 [109] Medium High   High   Medium High   Medium High   Medium Medium Low    Medium Medium
 [121] High   Medium Medium High   Medium Medium High   Medium Low    Medium Medium Medium
 [133] Low    Medium Medium Low    Low    Low    Medium Medium Medium Medium Medium High  
 [145] Medium Low    High   High   Medium Medium Medium Medium Medium High   Medium Low   
 [157] Low    Medium Medium Medium High   Medium Low    Medium Medium Low    High   Medium
 [169] Medium High   Medium High   Medium Medium High   Low    Low    Medium Medium High  
 [181] Low    Medium Medium High   Medium Medium Medium High   Medium Medium Medium Medium
 [193] High   Medium Low    Medium Medium Medium Medium Medium High   Medium High   High  
 [205] Medium Medium Medium Low    Medium Medium High   Low    Medium Medium Medium High  
 [217] Medium High   Medium Medium High   High   Medium Medium Low    High   Medium High  
 [229] Medium High   Medium Medium Low    Medium Low    Medium Medium Low    High   Medium
 [241] Medium High   Low    Medium Medium High   Medium High   Medium Medium Low    High  
 [253] Medium Medium Medium Medium Medium Medium High   Low    Medium High   High   Medium
 [265] Medium High   High   Medium Medium High   Medium High   High   Medium Low    High  
 [277] Medium High   Medium Low    High   Medium Medium Medium High   Medium Medium High  
 [289] Medium Medium Medium Low    Medium Medium Medium Medium Low    Medium High   High  
 [301] Medium Low    High   High   Medium High   High   Medium Medium Medium Medium High  
 [313] Medium High   Low    Medium Medium Medium Medium Low    Medium High   Low    Low   
 [325] Medium Medium Medium Low    Medium Medium Medium Medium Medium Low    Medium High  
 [337] High   High   Medium High   Low    High   Medium Low    Low    Medium Medium Medium
 [349] Low    Medium Medium Low    High   Medium High   Medium Medium Medium Low    Medium
 [361] Low    Low    Medium Medium High   Medium Medium Medium Medium High   High   Medium
 [373] Medium Medium High   Medium High   Medium Low    High   Low    Medium Medium High  
 [385] Medium High   Medium Low    Medium Medium Low    Low    Medium Medium Medium High  
 [397] Medium High   Medium Medium Medium Low    Medium High   High   Medium Medium Medium
 [409] Medium Low    Medium Medium Medium Medium Medium Medium Medium Medium High   Medium
 [421] Medium Medium Medium High   High   Medium Medium High   Medium Low    High   Medium
 [433] Medium High   Low    Medium Medium High   Low    Medium Low    Low    Medium Medium
 [445] High   Low    Low    Medium Low    High   Medium High   Medium Medium High   Low   
 [457] Low    Medium Medium Medium Medium Medium Medium Medium High   Medium Medium Low   
 [469] Medium Medium Medium High   High   High   High   Low    High   High   High   High  
 [481] High   High   Medium Medium Low    High   Medium High   Medium Medium High   High  
 [493] High   Low    Medium High   Medium Medium Medium Medium High   High   Low    Medium
 [505] Medium Medium High   Medium Medium Medium Medium Medium Medium Medium Medium High  
 [517] Medium High   Medium High   High   High   Medium Medium High   Medium Medium Low   
 [529] Medium High   Medium Medium Medium High   Medium Medium Medium Medium Low    High  
 [541] Medium High   High   High   Medium Medium Medium High   Medium High   Medium Low   
 [553] Medium Medium Medium Medium Medium Medium Medium Low    High   Medium High   Medium
 [565] Low    High   High   Medium High   High   Low    Low    Low    High   Medium High  
 [577] High   High   Medium Low    Medium Medium High   Medium High   Low    Medium High  
 [589] High   High   High   Medium Medium High   High   Medium Medium Low    Medium Low   
 [601] High   Medium High   Medium Medium High   Medium Medium Medium High   Medium Medium
 [613] Low    Medium Medium Medium Medium Medium Low    Medium High   Medium Low    Medium
 [625] High   High   High   Medium Medium Medium Low    Medium High   Medium Low    Medium
 [637] High   High   Low    Low    High   Medium Medium Low    High   Medium Low    Medium
 [649] High   High   Medium Medium Medium Low    Medium Medium Medium Medium Medium Medium
 [661] Medium Low    High   Medium High   Medium High   High   Medium Low    Medium Low   
 [673] Medium High   Low    Medium Medium High   Low    Medium Low    High   High   Medium
 [685] Low    Medium Medium Medium Medium Medium Medium Low    Medium High   Medium Medium
 [697] Medium High   Medium Medium Low    Medium Medium High   High   High   Medium Low   
 [709] High   Medium Medium Medium High   Low    Medium High   Medium High   Medium High  
 [721] High   High   High   Medium High   Low    High   Medium Medium High   Low    Medium
 [733] Medium Medium Medium Medium Low    Low    Medium Low    High   High   Medium Low   
 [745] Medium High   Medium Low    High   High   High   High   High   Medium High   Medium
 [757] Medium High   High   Medium Low    Low    Medium Medium Medium Medium Medium Medium
 [769] High   High   Low    Low    High   Medium High   Medium Medium High   High   Medium
 [781] Low    Medium High   High   Medium High   Medium Medium Medium Medium High   Low   
 [793] Medium High   High   Medium Low    Medium Low    High   Medium Medium High   Medium
 [805] Medium Low    High   Low    Medium Medium Low    Medium Medium High   High   High  
 [817] Low    Medium High   Medium Medium High   High   Medium High   High   High   Medium
 [829] High   Low    Medium High   Medium High   Low    Low    Medium Low    High   High  
 [841] Medium Medium High   High   Medium Low    Low    Low    Medium Medium Medium Medium
 [853] Medium High   High   Medium High   Medium Medium High   High   Low    Medium Low   
 [865] Medium Medium Medium Medium High   Medium Medium Medium High   Medium Medium Medium
 [877] High   Medium Low    Medium High   Medium Medium Medium High   Medium High   Medium
 [889] Medium Low    High   Low    Medium Medium Medium Medium Medium High   Medium Medium
 [901] Medium Medium Medium High   Medium High   Medium Low    Medium Medium Medium Medium
 [913] Medium Medium Low    High   High   High   High   High   Medium High   Medium High  
 [925] Medium High   Low    Medium Medium Medium High   High   Medium Medium Medium High  
 [937] Low    Medium Medium Medium Medium High   Medium Low    Medium Medium High   High  
 [949] Medium High   Medium Low    Medium Medium High   Low    Medium Medium Medium High  
 [961] Medium High   Medium High   High   Medium Medium Medium High   Medium Medium High  
 [973] Medium Medium High   Medium Medium Medium Medium High   Medium High   Medium High  
 [985] High   Low    Medium High   High   Low    Low    Medium High   Medium Medium Medium
 [997] Medium High   Medium Medium
 [ reached getOption("max.print") -- omitted 29159 entries ]
Levels: Low Medium High

histograms

# One histogram per numeric attribute. The calls are kept in this exact form
# because hist() builds its default title and x-axis label from the argument
# expression as written.
hist(dataset$age)

# num_salary is the 0/1 encoding of salary created earlier, so this shows the
# class balance.
hist(dataset$num_salary)

hist(dataset$fnlwgt)

hist(dataset$`education-num`)

hist(dataset$`capital-gain`)

hist(dataset$`capital-loss`)

hist(dataset$`hours-per-week`)

bar plots

# Draw one bar chart of category counts for each categorical attribute,
# in the same order as before.
for (col_name in c("workclass", "education", "marital-status", "occupation",
                   "relationship", "race", "sex", "native-country", "salary")) {
  barplot(table(dataset[[col_name]]))
}

box plot

# Distribution of age within each salary class.
boxplot(age~ salary, data = dataset)

# Distribution of weekly working hours within each salary class.
boxplot(`hours-per-week`~ salary, data = dataset)

scatter plot

# 3D scatter plot; num_salary, age and hours-per-week are passed as the first,
# second and third coordinate arguments respectively.
scatterplot3d(dataset$num_salary,dataset$age, dataset$`hours-per-week`)

pie chart for the salary attribute

# Count the rows in each salary class (the pipe is kept so the resulting table
# has the same dimnames as before).
tab <- dataset$salary %>% table()
# Share of each class as a percentage, rounded to one decimal place.
precentages <- round(prop.table(tab), 3) * 100
# Slice labels: class name on the first line, percentage on the second.
txt <- paste0(names(tab), "\n", precentages, "%")
pie(tab, labels = txt)

Normalization

# Keep a copy of the data before any rescaling; the normalization calls below
# all read their input from this copy.
dataWithoutNormalization <- dataset
print(dataWithoutNormalization)
# Min-max scaling: linearly maps x onto the range [0, 1].
#   x      numeric vector to rescale.
#   na.rm  if TRUE, NA values are ignored when computing min/max (NA entries
#          stay NA in the result); the default FALSE keeps the old behaviour.
# Returns a numeric vector of the same length as x. A constant vector
# (max == min) is mapped to zeros instead of NaN from a 0 / 0 division.
normalize <- function(x, na.rm = FALSE) {
  lo <- min(x, na.rm = na.rm)
  span <- max(x, na.rm = na.rm) - lo
  # isTRUE() keeps an NA span (NA input with na.rm = FALSE) out of this branch.
  if (isTRUE(span == 0)) {
    return(x - lo)
  }
  (x - lo) / span
}

# Z-score standardization: centers x on its mean and scales by its standard
# deviation.
#   x      numeric vector to standardize.
#   na.rm  if TRUE, NA values are ignored when computing mean/sd (NA entries
#          stay NA in the result); the default FALSE keeps the old behaviour.
# Returns a numeric vector of the same length as x. A vector with zero
# standard deviation is mapped to zeros instead of NaN from a 0 / 0 division.
Z_normalize <- function(x, na.rm = FALSE) {
  centered <- x - mean(x, na.rm = na.rm)
  spread <- sd(x, na.rm = na.rm)
  # isTRUE() keeps an NA sd (NA input, or length-1 input) out of this branch.
  if (isTRUE(spread == 0)) {
    return(centered)
  }
  centered / spread
}

# Rescale each numeric attribute, always reading the raw values from the
# untouched copy and printing the data after every step. Each column is first
# min-max scaled and then immediately overwritten with its Z-score, so the
# Z-scored values are the ones left in dataset at the end.
for (col_name in c("age", "fnlwgt", "education-num", "hours-per-week",
                   "capital-gain", "capital-loss")) {
  # Call normalize function
  dataset[[col_name]] <- normalize(dataWithoutNormalization[[col_name]])
  print(dataset)

  # Call Z_normalize function (replaces the min-max values)
  dataset[[col_name]] <- Z_normalize(dataWithoutNormalization[[col_name]])
  print(dataset)
}
NA
LS0tDQp0aXRsZTogInBoYXNlIDEiDQpvdXRwdXQ6IGh0bWxfbm90ZWJvb2sNCi0tLQ0KDQppbnN0YWxsaW5nIHRoZSBwYWNrYWdlcw0KYGBge3J9DQppbnN0YWxsLnBhY2thZ2VzKCJvdXRsaWVycyIpDQppbnN0YWxsLnBhY2thZ2VzKCJzY2F0dGVycGxvdDNkIikgDQppbnN0YWxsLnBhY2thZ2VzKCJkcGx5ciIpDQoNCmBgYA0KcmVhZGluZyBsaWJyYXJpZXMgYW5kIHRoZSBkYXRhc2V0DQpgYGB7cn0NCmxpYnJhcnkob3V0bGllcnMpDQpsaWJyYXJ5KHNjYXR0ZXJwbG90M2QpDQpsaWJyYXJ5KGRwbHlyKQ0KDQpsaWJyYXJ5KHJlYWRyKQ0KZGF0YXNldCA8LSByZWFkX2NzdigiR2l0SHViL1NhbGFyeVByZWRpY3Rpb24vRGF0YXNldC9zYWxhcnkuY3N2IikNCmBgYA0KU2FtcGxlIG9mIHJhdyBkYXRhc2V0IGFuZCBzdW1tYXJ5IA0KYGBge3J9DQpWaWV3KGRhdGFzZXQpDQpzdW1tYXJ5KGRhdGFzZXQpDQpgYGANCiBNaXNzaW5nIHZhbHVlcw0KYGBge3J9DQpzdW0oaXMubmEoZGF0YXNldCkpDQpgYGANCiB3ZSBub3RpY2VkIHRoYXQgdGhlcmUgaXMgYSBxdWVzdGlvbiBtYXJrIGluIHNvbWUgdmFsdWVzIGFsdGhvdWdoIHdlIGNoZWNrZWQgdGhlIG1pc3NpbmcgdmFsdWVzIGluIHByZXZpb3VzIHBhcnQgYW5kIHRoZSByZXNhdWx0IHdhcyAwIHNvIHdlIGFyZSBnb2luZyB0byBjbGVhbiB0aGVtIGJ5IGRlbGV0aW5nIHRoZSByb3cNCmBgYHtyfQ0KZGF0YXNldCA8LSBkYXRhc2V0WyFhcHBseShkYXRhc2V0ID09ICI/IiwgMSwgYW55KSwgXQ0KcHJpbnQoZGF0YXNldCkNCmBgYA0KcmVtb3Zpbmcgb3V0bGllcnMNCmBgYHtyfQ0KT3V0QWdlID0gb3V0bGllcihkYXRhc2V0JGFnZSwgbG9naWNhbCA9VFJVRSkNCnN1bShPdXRBZ2UpDQpGaW5kX291dGxpZXIgPSB3aGljaChPdXRBZ2UgPT1UUlVFLCBhcnIuaW5kID0gVFJVRSkNCk91dEFnZQ0KRmluZF9vdXRsaWVyDQojIyMjDQpPdXRmbmx3Z3QgPSBvdXRsaWVyKGRhdGFzZXQkZm5sd2d0LCBsb2dpY2FsID1UUlVFKQ0Kc3VtKE91dGZubHdndCkNCkZpbmRfb3V0bGllciA9IHdoaWNoKE91dGZubHdndCA9PVRSVUUsIGFyci5pbmQgPSBUUlVFKQ0KT3V0Zm5sd2d0DQojIyMNCk91dGVkdWNhdGlvbiA9IG91dGxpZXIoZGF0YXNldCRgZWR1Y2F0aW9uLW51bWAsIGxvZ2ljYWwgPVRSVUUpDQpzdW0oT3V0ZWR1Y2F0aW9uKQ0KRmluZF9vdXRsaWVyID0gd2hpY2goT3V0ZWR1Y2F0aW9uID09VFJVRSwgYXJyLmluZCA9IFRSVUUpDQpPdXRlZHVjYXRpb24NCiMjDQoNCk91dGhvdXJzID0gb3V0bGllcihkYXRhc2V0JGBob3Vycy1wZXItd2Vla2AsIGxvZ2ljYWwgPVRSVUUpDQpzdW0oT3V0aG91cnMpDQpGaW5kX291dGxpZXIgPSB3aGljaChPdXRob3VycyA9PVRSVUUsIGFyci5pbmQgPSBUUlVFKQ0KT3V0aG91cnMNCiMjIw0KT3V0Y2FwaXRhbEcgPSBvdXRsaWVyKGRhdGFzZXQkYGNhcGl0YWwtZ2FpbmAsIGxvZ2ljYWwgPVRSVUUpDQpzdW0oT3V0Y2FwaXRhbEcpDQpGaW5kX291dGxpZXIgPSB3aGljaChPdXRj
YXBpdGFsRyA9PVRSVUUsIGFyci5pbmQgPSBUUlVFKQ0KT3V0Y2FwaXRhbEcNCiMjIw0KT3V0Y2FwaXRhbEwgPSBvdXRsaWVyKGRhdGFzZXQkYGNhcGl0YWwtbG9zc2AsIGxvZ2ljYWwgPVRSVUUpDQpzdW0oT3V0Y2FwaXRhbEwpDQpGaW5kX291dGxpZXIgPSB3aGljaChPdXRjYXBpdGFsTCA9PVRSVUUsIGFyci5pbmQgPSBUUlVFKQ0KT3V0Y2FwaXRhbEwNCg0KDQojUmVtb3ZlIG91dGxpZXINCmRhdGFzZXQ9IGRhdGFzZXRbLUZpbmRfb3V0bGllcixdDQoNCmBgYA0KcHJpbnRpbmcgdGhlIGRhdGFzZXQgYWZ0ZXIgY2xlYW5pbmcgdGhlIGRhdGENCmBgYHtyfQ0KcHJpbnQoZGF0YXNldCkNCmBgYA0KDQpDcmVhdGUgYSBuZXcgY29sdW1uIGNhbGxlZCBudW1fc2FsYXJ5IHRvIHRyYW5zZm9ybSB0aGUgYmluYXJ5IGF0dHJpYnV0ZSBpbnRvIG51bXJpY2FsIHRvIHVzZSBpdCBiZXR0ZXIgYXMgaXQgaXQgdGhlIGNsYXNzIGxhYmVsDQpgYGB7cn0NCmRhdGFzZXQkbnVtX3NhbGFyeSA8LSBpZmVsc2UoZGF0YXNldCRzYWxhcnkgPT0gIj41MEsiLCAxLCAwKQ0KDQpgYGANCkRhdGEgc3VtbWFyeQ0KYGBge3J9DQpzdW1tYXJ5KGRhdGFzZXQkYWdlKQ0Kc3VtbWFyeShkYXRhc2V0JGBob3Vycy1wZXItd2Vla2ApDQpzdW1tYXJ5KGRhdGFzZXQkZWR1Y2F0aW9uKQ0Kc3VtbWFyeShkYXRhc2V0JG9jY3VwYXRpb24pDQpzdW1tYXJ5KGRhdGFzZXQkc2V4KQ0Kc3VtbWFyeShkYXRhc2V0JHNhbGFyeSkNCmBgYA0KdmFyaWFuY2UgDQpgYGB7cn0NCnZhcihkYXRhc2V0JGFnZSkNCnZhcihkYXRhc2V0JGBob3Vycy1wZXItd2Vla2ApDQpgYGANCkRpc2NyZXRpemUgdGhlIGhvdXJzLXBlci13ZWVrIGludG8gdGhyZWUgYmlucw0KYGBge3J9DQpkYXRhc2V0JGhvdXJzX3Blcl93ZWVrX2Jpbm5lZCA8LSBjdXQoZGF0YXNldCRgaG91cnMtcGVyLXdlZWtgLCBicmVha3MgPSBjKDAsIDMwLCA0MCwgSW5mKSwgbGFiZWxzID0gYygiTG93IiwgIk1lZGl1bSIsICJIaWdoIikpDQpwcmludChkYXRhc2V0JGhvdXJzX3Blcl93ZWVrX2Jpbm5lZCkNCmBgYA0KaGlzdG9ncmFtcw0KYGBge3J9DQpoaXN0KGRhdGFzZXQkYWdlKQ0KaGlzdChkYXRhc2V0JG51bV9zYWxhcnkpDQpoaXN0KGRhdGFzZXQkZm5sd2d0KQ0KaGlzdChkYXRhc2V0JGBlZHVjYXRpb24tbnVtYCkNCmhpc3QoZGF0YXNldCRgY2FwaXRhbC1nYWluYCkNCmhpc3QoZGF0YXNldCRgY2FwaXRhbC1sb3NzYCkNCmhpc3QoZGF0YXNldCRgaG91cnMtcGVyLXdlZWtgKQ0KYGBgDQoNCmJhciBwbG90cyANCmBgYHtyfQ0KYmFycGxvdCh0YWJsZShkYXRhc2V0JHdvcmtjbGFzcykpDQpiYXJwbG90KHRhYmxlKGRhdGFzZXQkZWR1Y2F0aW9uKSkNCmJhcnBsb3QodGFibGUoZGF0YXNldCRgbWFyaXRhbC1zdGF0dXNgKSkNCmJhcnBsb3QodGFibGUoZGF0YXNldCRvY2N1cGF0aW9uKSkNCmJhcnBsb3QodGFibGUoZGF0YXNldCRyZWxhdGlvbnNoaXApKQ0KYmFycGxvdCh0YWJsZShkYXRhc2V0JHJhY2UpKQ0KYmFycGxvdCh0YWJs
ZShkYXRhc2V0JHNleCkpDQpiYXJwbG90KHRhYmxlKGRhdGFzZXQkYG5hdGl2ZS1jb3VudHJ5YCkpDQpiYXJwbG90KHRhYmxlKGRhdGFzZXQkc2FsYXJ5KSkNCmBgYA0KDQogYm94IHBsb3QNCmBgYHtyfQ0KYm94cGxvdChhZ2V+IHNhbGFyeSwgZGF0YSA9IGRhdGFzZXQpDQpib3hwbG90KGBob3Vycy1wZXItd2Vla2B+IHNhbGFyeSwgZGF0YSA9IGRhdGFzZXQpDQpgYGANCg0Kc2NhdHRlciBwbG90DQpgYGB7cn0NCnNjYXR0ZXJwbG90M2QoZGF0YXNldCRudW1fc2FsYXJ5LGRhdGFzZXQkYWdlLCBkYXRhc2V0JGBob3Vycy1wZXItd2Vla2ApDQpgYGANCg0KcGllIGNoYXJ0IGZvciB0aGUgc2FsYXJ5IGF0dHJpYnV0ZQ0KYGBge3J9DQp0YWIgPC0gZGF0YXNldCRzYWxhcnkgJT4lIHRhYmxlKCkNCnByZWNlbnRhZ2VzIDwtIHRhYiAlPiUgcHJvcC50YWJsZSgpICU+JSByb3VuZCgzKSAqIDEwMCANCnR4dCA8LSBwYXN0ZTAobmFtZXModGFiKSwgJ1xuJywgcHJlY2VudGFnZXMsICclJykgDQpwaWUodGFiLCBsYWJlbHM9dHh0KQ0KYGBgDQoNCk5vcm1hbGl6YXRpb24NCmBgYHtyfQ0KZGF0YVdpdGhvdXROb3JtYWxpemF0aW9uIDwtIGRhdGFzZXQNCnByaW50KGRhdGFXaXRob3V0Tm9ybWFsaXphdGlvbikNCiNEZWZpbmUgZnVuY3Rpb27CoG5vcm1hbGl6ZSgpLg0Kbm9ybWFsaXplIDwtIGZ1bmN0aW9uKHgpIHtyZXR1cm4gKCh4IC0gbWluKHgpKSAvIChtYXgoeCkgLSBtaW4oeCkpKX0NCiNEZWZpbmUgZnVuY3Rpb27CoFpfbm9ybWFsaXplKCkuDQpaX25vcm1hbGl6ZSA8LSBmdW5jdGlvbih4KSB7cmV0dXJuICgoeCAtIG1lYW4oeCkpIC8gc2QoeCkpfQ0KDQojQ2FsbCBub3JtYWxpemUgZnVuY3J0aW9uIA0KZGF0YXNldCRhZ2U8LW5vcm1hbGl6ZShkYXRhV2l0aG91dE5vcm1hbGl6YXRpb24kYWdlKQ0KcHJpbnQoZGF0YXNldCkNCg0KI0NhbGwgWl9ub3JtYWxpemUgZnVuY3J0aW9uIA0KZGF0YXNldCRhZ2U8LVpfbm9ybWFsaXplKGRhdGFXaXRob3V0Tm9ybWFsaXphdGlvbiRhZ2UpDQpwcmludChkYXRhc2V0KQ0KDQojIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIw0KDQojQ2FsbCBub3JtYWxpemUgZnVuY3J0aW9uIA0KZGF0YXNldCRmbmx3Z3Q8LW5vcm1hbGl6ZShkYXRhV2l0aG91dE5vcm1hbGl6YXRpb24kZm5sd2d0KQ0KcHJpbnQoZGF0YXNldCkNCg0KI0NhbGwgWl9ub3JtYWxpemUgZnVuY3J0aW9uIA0KZGF0YXNldCRmbmx3Z3Q8LVpfbm9ybWFsaXplKGRhdGFXaXRob3V0Tm9ybWFsaXphdGlvbiRmbmx3Z3QpDQpwcmludChkYXRhc2V0KQ0KDQojIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIw0KDQojQ2FsbCBub3JtYWxpemUgZnVuY3J0aW9uIA0KZGF0YXNldCRgZWR1Y2F0aW9uLW51bWA8LW5vcm1hbGl6ZShkYXRhV2l0aG91dE5vcm1hbGl6YXRpb24kYGVkdWNhdGlvbi1udW1gKQ0KcHJpbnQoZGF0YXNldCkNCg0KI0NhbGwgWl9ub3JtYWxpemUgZnVuY3J0aW9uIA0KZGF0YXNldCRgZWR1Y2F0aW9u
LW51bWA8LVpfbm9ybWFsaXplKGRhdGFXaXRob3V0Tm9ybWFsaXphdGlvbiRgZWR1Y2F0aW9uLW51bWApDQpwcmludChkYXRhc2V0KQ0KDQojIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIw0KDQoNCg0KI0NhbGwgbm9ybWFsaXplIGZ1bmNydGlvbiANCmRhdGFzZXQkYGhvdXJzLXBlci13ZWVrYDwtbm9ybWFsaXplKGRhdGFXaXRob3V0Tm9ybWFsaXphdGlvbiRgaG91cnMtcGVyLXdlZWtgKQ0KcHJpbnQoZGF0YXNldCkNCg0KI0NhbGwgWl9ub3JtYWxpemUgZnVuY3J0aW9uIA0KZGF0YXNldCRgaG91cnMtcGVyLXdlZWtgPC1aX25vcm1hbGl6ZShkYXRhV2l0aG91dE5vcm1hbGl6YXRpb24kYGhvdXJzLXBlci13ZWVrYCkNCnByaW50KGRhdGFzZXQpDQoNCiMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjDQoNCiNDYWxsIG5vcm1hbGl6ZSBmdW5jcnRpb24gDQpkYXRhc2V0JGBjYXBpdGFsLWdhaW5gPC1ub3JtYWxpemUoZGF0YVdpdGhvdXROb3JtYWxpemF0aW9uJGBjYXBpdGFsLWdhaW5gKQ0KcHJpbnQoZGF0YXNldCkNCg0KI0NhbGwgWl9ub3JtYWxpemUgZnVuY3J0aW9uIA0KZGF0YXNldCRgY2FwaXRhbC1nYWluYDwtWl9ub3JtYWxpemUoZGF0YVdpdGhvdXROb3JtYWxpemF0aW9uJGBjYXBpdGFsLWdhaW5gKQ0KcHJpbnQoZGF0YXNldCkNCg0KIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMNCg0KI0NhbGwgbm9ybWFsaXplIGZ1bmNydGlvbiANCmRhdGFzZXQkYGNhcGl0YWwtbG9zc2A8LW5vcm1hbGl6ZShkYXRhV2l0aG91dE5vcm1hbGl6YXRpb24kYGNhcGl0YWwtbG9zc2ApDQpwcmludChkYXRhc2V0KQ0KDQojQ2FsbCBaX25vcm1hbGl6ZSBmdW5jcnRpb24gDQpkYXRhc2V0JGBjYXBpdGFsLWxvc3NgPC1aX25vcm1hbGl6ZShkYXRhV2l0aG91dE5vcm1hbGl6YXRpb24kYGNhcGl0YWwtbG9zc2ApDQpwcmludChkYXRhc2V0KQ0KDQpgYGANCg0K